[1]:
from ckg.report_manager import project
from ckg.analytics_core.analytics import analytics
from ckg.analytics_core.viz import viz
from plotly.offline import init_notebook_mode, iplot
%matplotlib inline
init_notebook_mode(connected=True)
c:\users\sande\.conda\envs\pip_rev\lib\site-packages\outdated\utils.py:18: OutdatedPackageWarning:
The package pingouin is out of date. Your version is 0.3.11, the latest is 0.3.12.
Set the environment variable OUTDATED_IGNORE=1 to disable these warnings.
WGCNA functions will not work. Module Rpy2 not installed.
R functions will not work. Module Rpy2 not installed.
[3]:
p = project.Project(identifier='P0000014')
p.build_project(force=False)
p.generate_report()
[4]:
proteomics_dataset = p.get_dataset('proteomics')
pro_processed = proteomics_dataset.get_dataframe("processed")
[5]:
pro_processed = pro_processed.drop(['sample', 'subject'], axis=1)
[6]:
pro_processed.head()
[6]:
A2M~P01023 | A30~A2MYE2 | ABI3BP~Q7Z7G0 | ACE~P12821 | ACTB~P60709 | ACTN1~P12814 | ADA2~Q9NZK5 | ADAMTS13~Q76LX8 | ADAMTSL4~Q6UY14 | ADH4~P08319 | ... | VCL~P18206 | VH6DJ~A2N0T4 | VIM~P08670 | VK3~A2N2F4 | VNN1~O95497 | VTN~P04004 | VWF~P04275 | YWHAZ~P63104 | group | scFv~Q65ZC9 | |
---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
0 | 38.005564 | 28.173504 | 21.631230 | 22.251041 | 27.090330 | 25.039968 | 23.442151 | 24.010605 | 25.085820 | 23.389032 | ... | 26.337731 | 31.159485 | 24.178889 | 25.835908 | 22.480055 | 32.815815 | 28.922779 | 22.347244 | Cirrhosis | 27.788928 |
1 | 37.309118 | 27.981907 | 27.342062 | 23.847270 | 27.461155 | 25.896268 | 23.754503 | 24.135818 | 19.400048 | 22.148706 | ... | 25.535996 | 31.994997 | 23.709777 | 25.004889 | 23.852908 | 32.722121 | 29.881279 | 22.141285 | Cirrhosis | 26.869972 |
2 | 37.384952 | 28.857627 | 21.080035 | 22.863630 | 27.929764 | 24.295225 | 23.359443 | 24.121788 | 24.923476 | 23.017163 | ... | 25.858635 | 30.139559 | 23.599064 | 26.271650 | 24.232132 | 32.755752 | 29.444625 | 21.972598 | Cirrhosis | 28.069328 |
3 | 38.417225 | 28.978380 | 25.501910 | 22.992774 | 27.152479 | 25.231288 | 23.701340 | 24.568309 | 24.878802 | 26.388112 | ... | 26.531017 | 31.977294 | 24.179076 | 25.929200 | 24.269047 | 32.714014 | 29.397176 | 22.216971 | Cirrhosis | 28.170209 |
4 | 37.471303 | 28.748744 | 20.200498 | 21.326143 | 27.537048 | 22.392992 | 22.406264 | 24.961173 | 20.480569 | 24.339540 | ... | 26.355535 | 30.485582 | 23.865224 | 26.701340 | 20.953141 | 32.722691 | 28.540895 | 18.630532 | Cirrhosis | 28.612280 |
5 rows × 510 columns
[7]:
sample_size, power_df = analytics.power_analysis(pro_processed, group='group', groups=None, alpha=0.05, power=0.8, dep_var='nobs', figure=True)
print('Sample Size: %.3f' % sample_size)
Sample Size: 50.400
[8]:
plot = viz.get_scatterplot(power_df, identifier='power', args={'x':'#samples',
'y':'power',
'name':'labels',
'group':'labels',
'x_title': 'Number of Samples',
'y_title': 'Power'
})
iplot(plot.figure)
[ ]:
[ ]: